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TER 



1 <110> APPLICANT: Austin-Phillips, Sandra

2 Burgess, Richard D 

3 German, Thomas L 

4 Ziegelhoffer, Thomas

5 <120> TITLE OF INVENTION: Transgenic Plants as an Alternative Source of

6 Lignocellulosic-Degrading Enzymes

7 <130> FILE REFERENCE: Transgenic Plants Expressing Cellulase 

8 <140> CURRENT APPLICATION NUMBER: US/09/373,272 bii

9 <141> CURRENT FILING DATE: 1999-08-12 

10 <150> EARLIER APPLICATION NUMBER: 08/883,495

11 <151> EARLIER FILING DATE: 1997-06-26 

12 <160> NUMBER OF SEQ ID NOS: 32

13 <170> SOFTWARE: PatentIn Ver. 2.0

14 <210> SEQ ID NO 1 

15 <211> LENGTH: 1621 

16 <212> TYPE: DNA 

17 <213> ORGANISM: Thermomonospora fusca 

18 <400> SEQUENCE: 1 

19 cgatatggat gatctgacgt ctgaatcccc ttgtcaccct agacattcac ccattttgtc 60 

20 gcttttacgg ctttctttgg gagttctccg tttcaccaag gaacaaaacc gcaacggaga 120 

21 gtaggcgcgg tctttacagc tcccttgcca atggttatcg tccgaacgga aaacgatctg 180 

22 ggagcgctcc cagccatgcg ctcctcttcg tgcccctcac ttcttttgag ccttgtgctc 240 

23 gttaggagcc ccgaatgtcc cccagacctc ttcgcgctct tctgggcgcc gcggcggcgg 300 

24 ccttggtcag cgcggctgct ctggccttcc ggtcgcaagc ggcggccaat gattctccgt 360

25 tctacgtcaa ccccaacatg tcctccgccg aatgggtgcg gaacaacccc aacgacccgc 420 

26 gtaccccggt aatccgcgac cggatcgcca gcgtgccgca gggcacctgg ttcgcccacc 480 

27 acaaccccgg gcagatcacc ggccagatcg acgcgctcat gagcgccgcc caggccgccg 540 

28 gcaagatccc gatcctggtc gtgtacaacg ccccgggccg cgactgcggc aaccacagca 600 

29 gcggcggcgc ccccagtcac agcgcctacc ggtcctggat cgacgaattc gctgccggac 660 
30 tgaagaaccg tcccgcccac atcatcgtcg ggccggacct gatctcgctg atgtcgagct 720

31 gcatccagca cgtccagcag gaagtcctgg agacgatggc gtacgcgggc aaggccctca 780 

32 aggccgggtc ctcgcaggcg cggatctact tcgacgccgg ccactccgcg tggcactcgc 840 
33 ccgcacagat ggcttcctgg ctccagcagg ccgacatctc caacagcgcg cacggtatcg 900

34 ccaccaacac ctccaactac cggtggaccg ctgacgaggt cgcctacgcc aaggcggtgc 960 

35 tctcggccat cggcaacccg tccctgcgcg cggtcatcga caccagccgc aacggcaacg 1020 

36 gccccgccgg taacgagtgg tgcgacccca gcggacgcgc catcggcacg cccagcacca 1080 

37 ccaacaccgg cgacccgatg atcgacgcct tcctgtggat caagctgccg ggtgaggccg 1140 
38 acggctgcat cgccggcgcc ggccagttcg tcccgcaggc ggcctacgag atggcgatcg 1200
39 ccgcgggcgg caccaacccc aacccgaacc ccaacccgac gcccaccccc actccgaccc 1260

40 ccacgccgcc tcccggctcc tcgggggcgt gcacggcgac gtacacgatc gccaacgagt 1320 

41 ggaacgacgg cttccaggcg accgtgacgg tcaccgcgaa ccagaacatc accggctgga 1380

42 ccgtgacatg gaccttcacc gacggccaga ccatcaccaa cgcctggaac gccgacgtgt 1440 

43 ccaccagcgg ctcctcggtg accgcgcgga acgtcggcca caacggaacg ctctcccagg 1500 

44 gagcccccac agagttcggc ttcgtcggct ctaagggcaa ctccaactct gttccgaccc 1560 
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45 ttacctgcgc cgccagctga cccctcctgg cagtgcactg ggtggcttag gcgtgctggg 1620

46 g 1621



47 <210> SEQ ID NO 2 

48 <211> LENGTH: 3503 

49 <212> TYPE: DNA 

50 <213> ORGANISM: Thermomonospora fusca 

51 <400> SEQUENCE: 2 

52 cggcgatccc cctcatcatt caggtgcggt tagttccccc aggctaccga ggaccgaatt 60 

53 tcggtccgtt tttcttgcgg cgagccctga gaccgtttcc tgttccgttc cgtcaccatc 120 

54 cttgcgcgtc ccggcggagg ggggaagcac cccgcgagat ggctccgcca cggcctgttt 180 

55 ccgacccccg tcacaaaagc ccatttaacg cggtatttac aaccggtcat gaagtggcta 240 

56 ctctcttttg ggagcgctcc cgtgccgcta gtcacactgg gacgtgaatg gcgtcacggt 300 

57 agggctcgtc gtgtgacacg cattttcgac cctgctttaa gtccctaagt gggagcgctc 360 

58 ccagccttcg ggagaactcc cacacaacca accgtccgac gccactctcc cagcgctcaa 420

59 acggaggcag cagtgttcac catcccccgc tcccctccgg ggcgcccggc cgtcgtccgc 480 

60 gcaaccaccc cgaccggtcg gctgaacact gcagcgtccg gttctcgacc atccccttgc 540 

61 gagagaacat cctccaacca aggaagacac cgatatgagt aaagttcgtg ccacgaacag 600 

62 acgttcgtgg atgcggcgcg ggctggcagc cgcctctgga ctggcgcttg gcgcctccat 660 

63 ggtggcgttc gctgctccgg ccaacgccgc cggctgctcg gtgtactaca cggtcaactc 720

64 ctggggtacc gggttcaccg ccaacgtcac catcaccaac ctcggcagtg cgatcaacgg 780 

65 ctggaccctg gagtgggact tccccggcaa ccagcaggtg accaacctgt ggaacgggac 840 

66 ctacacccag tccgggcagc acgtgtcggt cagcaacgcc ccgtacaacg cctccatccc 900 

67 ggccaacgga acggttgagt tcgggttcaa cggctcctac tcgggcagca acgacatccc 960 

68 ctcctccttc aagctgaacg gggttacctg cgacggctcg gacgaccccg accccgagcc 1020 

69 cagcccctcc cccagccctt cccccagccc cacagacccg gatgagccgg gcggcccgac 1080 

70 caacccgccc accaaccccg gcgagaaggt cgacaacccg ttcgagggcg ccaagctgta 1140 

71 cgtgaacccg gtctggtcgg ccaaggccgc cgctgagccg ggcggttccg cggtcgccaa 1200 

72 cgagtccacc gctgtctggc tggaccgtat cggcgggatc gagggcaacg acagcccgac 1260 

73 caccggctcc atgggtctgc gcgaccacct ggaggaggcc gtccgccagt ccggtggcga 1320 

74 cccgctgacc atccaggtcg tcatctacca cctgcccggc cgcgactgcg ccgcgctggc 1380 

75 ctccaacggt gagctgggtc ccgatgaact cgaccgctac aagagcgagt acatcgaccc 1440 

76 gatcgccgac atcatgtggg acttcgcaga ctacgagaac ctgcggatcg tcgccatcat 1500 

77 cgagatcgac tccctgccca acctcgtcac caacgtgggc gggaacggcg gcaccgagct 1560 

78 ctgcgcctac atgaagcaga acggcggcta cgtcaacggt gtcggctacg ccctccgcaa 1620 

79 gctgggcgag atcccgaacg tctacaacta catcgacgcc gcccaccacg gctggatcgg 1680 

80 ctgggactcc aacttcggcc cctcggtgga catcttctac gaggccgcca acgcctccgg 1740 

81 ctccaccgtg gactacgtgc acggcttcat ctccaacacg gccaactact cggccactgt 1800 

82 ggagccgtac ctggacgtca acggcaccgt taacggccag ctcatccgcc agtccaagtg 1860

83 ggttgactgg aaccagtacg tcgacgagct ctccttcgtc caggacctgc gtcaggccct 1920 

84 gatcgccaag ggcttccggt ccgacatcgg tatgctcatc gacacctccc gcaacggctg 1980 

85 gggtggcccg aaccgtccga ccggaccgag ctcctccacc gacctcaaca cctacgttga 2040 

86 cgagagccgt atcgaccgcc gtatccaccc cggtaactgg tgcaaccagg ccggtgcggg 2100 

87 cctcggcgag cggcccacgg tcaacccggc tcccggtgtt gacgcctacg tctgggtgaa 2160 

88 gcccccgggt gagtccgacg gcgccagcga ggagatcccg aacgacgagg gcaagggctt 2220 

89 cgaccgcatg tgcgacccga cctaccaggg caacgcccgc aacggcaaca acccctcgga 2280 

90 tgcgctgccc aacgccccca tctccggcca ctggttctct gcccagttcc gcgagctgct 2340 

91 ggccaacgcc tacccgcctc tgtaaagcgg agtgaggcaa cggctgacag cctcaacgag 2400 

92 gaactgatca gcacctccta gccggagacg gcgcccgtcc actccccgtg ggcgggcgcc 2460 

93 gcttttatgc cgacccgtgc cccagccgca aggggcacgg gtcggcctat tccggcgatg 2520 

94 tcggtcacgt cgccctagca cccggaaacg ccgagaaaga ctgccccgaa acggtcctct 2580 
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95 cccatccctg cattaggttg gccgagtccg cctatggctt cgtgggccgg aacccaaccc 2640 

96 accatcaacg agaggtatca ccatggccag tgtggtgaaa ttcaatgtgc tgacggttcc 2700 

97 tcccggtgcc ggcgccaccc cggaggacgt ttgccaagcg cgcaggcctc gtggagaacc 2760

98 gggccgggtt tcacgagttc caactgccgg cgcccggcga cgggacggac aagtacatcg 2820 

99 tctacacgcg ctggcgctcc ggagaggact accagaactg gctgaacagc gaggccttcc 2880 

100 agcgcggaca cgcccaggcc tctgaagact cccgccgcag cagccagggc ggcccggccg 2940 

101 cgtccgcgag tgaactctgg tccttcgaag tcgtccagca cgtccaggcc caggactgat 3000 

102 cccggtgcgg ccctcggttc tttaccgggg gccgcccacc cccttcatcc cttttcttct 3060 

103 cccccgcacc ccttttgatc tgcaatgatg gaattcgcga ttcttgagaa ggccgatcgt 3120

104 gtccatgacc gcgcagaagg caggacgacc acgcgtaccg gtcgacatcg aaggagtcaa 3180

105 ctgacagtgg ggactatcgc ggggctgatt gtcgcgctgt caggcgtggg gatggtctcg 3240 

106 gccaacgtgc tcccgtggga accgtcggac ccggcatccg tggtccccgc cacctcgcag 3300

107 ggcagcagtt ctcccatgac gccggagccc tcgcgtcccc ggtaccccca ctcgtgcgct 3360 

108 ccgtggtcga agaggtgccc agcgcaagcg gagaactgcg ggtcgtcgaa ggtgacgggg 3420

109 aggtcgtcgg cgaaggcacg ctcctgcgct acctggtgga ggtcgaagaa gggcttcccg 3480 

110 gagaccccgc cgacttcgct gca 3503 

111 <210> SEQ ID NO 3 

112 <211> LENGTH: 21 

113 <212> TYPE: PRT 

114 <213> ORGANISM: Artificial Sequence 

115 <220> FEATURE: 

116 <223> OTHER INFORMATION: Description of Artificial Sequence: VSP Leader 

117 Sequence 

118 <400> SEQUENCE: 3

119 Met Lys Leu Phe Val Phe Phe Val Ala Ala Val Val Leu Val Ala Trp 

120 1 5 10 15

121 Pro Cys His Gly Ala 

122 20 

123 <210> SEQ ID NO 4 

124 <211> LENGTH: 25 

125 <212> TYPE: DNA 

126 <213> ORGANISM: Artificial Sequence 

127 <220> FEATURE: 

128 <223> OTHER INFORMATION: Description of Artificial Sequence: Xba E2 PCR 

129 Primer 

130 <400> SEQUENCE: 4

131 gctctagatg aatgattctc cgttc 25 

132 <210> SEQ ID NO 5 

133 <211> LENGTH: 17 

134 <212> TYPE: DNA 

135 <213> ORGANISM: Artificial Sequence

136 <220> FEATURE: 

137 <223> OTHER INFORMATION: Description of Artificial Sequence: Xba E2 PCR 

138 Primer 

139 <400> SEQUENCE: 5 

140 tgaccggcag caaaatg 17 

141 <210> SEQ ID NO 6 

142 <211> LENGTH: 25 

143 <212> TYPE: DNA 

144 <213> ORGANISM: Artificial Sequence 
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145 <220> FEATURE: 

146 <223> OTHER INFORMATION: Description of Artificial Sequence: Xba E3 PCR 

147 Primer 

148 <400> SEQUENCE: 6 

149 gctctagatg gccggctgct cggtg 25 

150 <210> SEQ ID NO 7 

151 <211> LENGTH: 23 

152 <212> TYPE: DNA 

153 <213> ORGANISM: Artificial Sequence 

154 <220> FEATURE: 

155 <223> OTHER INFORMATION: Description of Artificial Sequence: RIE3 PCR 

156 Primer 

157 <400> SEQUENCE: 7 

158 ggaattctta cagaggcggg tag 23 

159 <210> SEQ ID NO 8 

160 <211> LENGTH: 3004 

161 <212> TYPE: DNA 

162 <213> ORGANISM: Acidothermus cellulolyticus 

163 <300> PUBLICATION INFORMATION: 

164 <400> SEQUENCE: 8 

165 ggatccacgt tgtacaaggt cacctgtccg tcgttctggt agagcggcgg gatggtcacc 60 

166 cgcacgatct ctcctttgtt gatgtcgacg gtcacgtggt tacggtttgc ctcggccgcg 120 

167 attttcgcgc tcgggcttgc tccggctgtc gggttcggtt tggcgtggtg tgcggagcac 180 

168 gccgaggcga tcccaatgag ggcaagggca agagcggagc cgatggcacg tcgggtggcc 240 

169 gatggggtac gccgatgggg cgtggcgtcc ccgccgcgga cagaaccgga tgcggaatag 300 

170 gtcacggtgc gacatgttgc cgtaccgcgg acccggatga caagggtggg tgcgcgggtc 360 

171 gcctgtgagc tgccggctgg cgtctggatc atgggaacga tcccaccatt ccccgcaatc 420 

172 gacgcgatcg ggagcagggc ggcgcgagcc ggaccgtgtg gtcgagccgg acgattcgcc 480 

173 catacggtgc tgcaatgccc agcgccatgt tgtcaatccg ccaaatgcag caatgcacac 540 

174 atggacaggg attgtgactc tgagtaatga ttggattgcc ttcttgccgc ctacgcgtta 600 

175 cgcagagtag gcgactgtat gcggtaggtt ggcgctccag ccgtgggctg gacatgcctg 660 

176 ctgcgaactc ttgacacgtc tggttgaacg cgcaatactc ccaacaccga tgggatcgtt 720 

177 cccataagtt tccgtctcac aacagaatcg gtgcgccctc atgatcaacg tgaaaggagt 780 

178 acgggggaga acagacgggg gagaaaccaa cgggggattg gcggtgccgc gcgcattgcg 840 

179 gcgagtgcct ggctcgcggg tgatgctgcg ggtcggcgtc gtcgtcgcgg tgctggcatt 900 

180 ggttgccgca ctcgccaacc tagccgtgcc gcggccggct cgcgccgcgg gcggcggcta 960 

181 ttggcacacg agcggccggg agatcctgga cgcgaacaac gtgccggtac ggatcgccgg 1020 

182 catcaactgg tttgggttcg aaacctgcaa ttacgtcgtg cacggtctct ggtcacgcga 1080 

183 ctaccgcagc atgctcgacc agataaagtc gctcggctac aacacaatcc ggctgccgta 1140 

184 ctctgacgac attctcaagc cgggcaccat gccgaacagc atcaattttt accagatgaa 1200 

185 tcaggacctg cagggtctga cgtccttgca ggtcatggac aaaatcgtcg cgtacgccgg 1260 

186 tcagatcggc ctgcgcatca ttcttgaccg ccaccgaccg gattgcagcg ggcagtcggc 1320 

187 gctgtggtac acgagcagcg tctcggaggc tacgtggatt tccgacctgc aagcgctggc 1380

188 gcagcgctac aagggaaacc cgacggtcgt cggctttgac ttgcacaacg agccgcatga 1440 
189 cccggcctgc tggggctgcg gcgatccgag catcgactgg cgattggccg ccgagcgggc 1500

190 cggaaacgcc gtgctctcgg tgaatccgaa cctgctcatt ttcgtcgaag gtgtgcagag 1560 

191 ctacaacgga gactcctact ggtggggcgg caacctgcaa ggagccggcc agtacccggt 1620 

192 cgtgctgaac gtgccgaacc gcctggtgta ctcggcgcac gactacgcga cgagcgtcta 1680 

193 cccgcagacg tggttcagcg atccgacctt ccccaacaac atgcccggca tctggaacaa 1740 

194 gaactgggga tacctcttca atcagaacat tgcaccggta tggctgggcg aattcggtac 1800 
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195 gacactgcaa tccacgaccg accagacgtg gctgaagacg ctcgtccagt acctacggcc 1860 

196 gaccgcgcaa tacggtgcgg acagcttcca gtggaccttc tggtcctgga accccgattc 1920 

197 cggcgacaca ggaggaattc tcaaggatga ctggcagacg gtcgacacag taaaagacgg 1980 

198 ctatctcgcg ccgatcaagt cgtcgatttt cgatcctgtc ggcgcgtctg catcgcctag 2040 

199 cagtcaaccg tccccgtcgg tgtcgccgtc tccgtcgccg agcccgtcgg cgagtcggac 2100 

200 gccgacgcct actccgacgc cgacagccag cccgacgcca acgctgaccc ctactgctac 2160 

201 gcccacgccc acggcaagcc cgacgccgtc accgacggca gcctccggag cccgctgcac 2220 

202 cgcgagttac caggtcaaca gcgattgggg caatggcttc acggtaacgg tggccgtgac 2280 

203 aaattccgga tccgtcgcga ccaagacatg gacggtcagt tggacattcg gcggaaatca 2340 

204 gacgattacc aattcgtgga atgcagcggt cacgcagaac ggtcagtcgg taacggctcg 2400 

205 gaatatgagt tataacaacg tgattcagcc tggtcagaac accacgttcg gattccaggc 2460 
206 gagctatacc ggaagcaacg cggcaccgac agtcgcctgc gcagcaagtt aatacgtcgg 2520
207 ggagccgacg ggagggtccg gaccgtcggt tccccggctt ccacctatgg agcgaaccca 2580

208 acaatccgga cggaactgca ggtaccagag aggaacgaca cgaatgcccg ccatctcaaa 2640 

209 acggctgcga gccggcgtcc tcgccggggc ggtgagcatc gcagcctcca tcgtgccgct 2700 

210 ggcgatgcag catcctgcca tcgccgcgac gcacgtcgac aatccctatg cgggagcgac 2760 

211 cttcttcgtc aacccgtact gggcgcaaga agtacagagc gaacggcgaa ccagaccaat 2820 

212 gccactctcg cagcgaaaat gcgcgtcgtt tccacatatt cgacggccgt ctggatggac 2880 

213 cgcatcgctg cgatcaacgg cgtcaacggc ggacccggct tgacgacata tctggacgcc 2940

214 gccctctccc agcagcaggg aaccacccct gaagtcattg agattgtcat ctacgatctg 3000 

215 ccgg 3004 

216 <210> SEQ ID NO 9 

217 <211> LENGTH: 2220 

218 <212> TYPE: DNA 

219 <213> ORGANISM: Trichoderma reesei 

220 <300> PUBLICATION INFORMATION: 

221 <308> DATABASE ACCESSION NUMBER: Genbank E00389 

222 <309> DATABASE ENTRY DATE: 1997-09-29 

223 <310> PATENT DOCUMENT NUMBER: JP 1985149387-A1 

224 <312> PUBLICATION DATE: 1985-08-06 

225 <400> SEQUENCE: 9 

226 aaggttagcc aagaacaata gccgataaag atagcctcat taaacggaat gagctagtag 60 

227 gcaaagtcag cgaatgtgta tatataaagg ttcgaggtcc gtgcctccct catgctctcc 120 

228 ccatctactc atcaactcag atcctccagg agacttgtac accatctttt gaggcacaga 180 

229 aacccaatag tcaaccgcgg actggcatca tgtatcggaa gttggccgtc atcacggcct 240 

230 tcttggccac agctcgtgct cagtcggcct gcactctcca atcggagact cacccgcctc 300 
231 tgacatggca gaaatgctcg tctggtggca cttgcactca acagacaggc tccgtggtca 360

232 tcgacgccaa ctggcgctgg actcacgcta cgaacagcag cacgaactgc tacgatggca 420 

233 acacttggag ctcgacccta tgtcctgaca acgagacctg cgcgaagaac tgctgtctgg 480 

234 acggtgccgc ctacgcgtcc acgtacggag ttaccacgag cggtaacagc ctctccattg 540 

235 gctttgtcac ccagtctgcg cagaagaacg ttggcgctcg cctttacctt atggcgagcg 600 

236 acacgaccta ccaggaattc accctgcttg gcaacgagtt ctctttcgat gttgatgttt 660 

237 cgcagctgcc gtaagtgact taccatgaac ccctgacgta tcttcttgtg ggctcccagc 720 

238 tgactggcca atttaaggtg cggcttgaac ggagctctct acttcgtgtc catggacgcg 780 

239 gatggtggcg tgagcaagta tcccaccaac aacgctggcg ccaagtacgg cacggggtac 840 

240 tgtgacagcc agtgtccccg cgatctgaag ttcatcaatg gccaggccaa cgttgagggc 900 

241 tgggagccgt catccaacaa cgcaaacacg ggcattggag gacacggaag ctgctgctct 960 

242 gagatggata tctgggaggc caactccatc tccgaggctc ttacccccca cccttgcacg 1020 

243 actgtcggcc aggagatctg cgagggtgat gggtgcggcg gaacttactc cgataacaga 1080 

244 tatggcggca cttgcgatcc cgatggctgc gactggaacc cataccgcct gggcaacacc 1140 
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